Using cuda device
Wrapping the env with a `Monitor` wrapper
Wrapping the env in a DummyVecEnv.
Logging to complexcity_dqn/DQN_1
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 80.8      |
|    ep_rew_mean      | -1.29e+03 |
|    exploration_rate | 0.969     |
| time/               |           |
|    episodes         | 4         |
|    fps              | 27        |
|    time_elapsed     | 11        |
|    total_timesteps  | 323       |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 26.3      |
|    n_updates        | 122       |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 80.5      |
|    ep_rew_mean      | -1.71e+03 |
|    exploration_rate | 0.939     |
| time/               |           |
|    episodes         | 8         |
|    fps              | 27        |
|    time_elapsed     | 23        |
|    total_timesteps  | 644       |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 22.2      |
|    n_updates        | 443       |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 81.8      |
|    ep_rew_mean      | -1.68e+03 |
|    exploration_rate | 0.907     |
| time/               |           |
|    episodes         | 12        |
|    fps              | 27        |
|    time_elapsed     | 35        |
|    total_timesteps  | 982       |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 26.6      |
|    n_updates        | 781       |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 78.2      |
|    ep_rew_mean      | -1.79e+03 |
|    exploration_rate | 0.881     |
| time/               |           |
|    episodes         | 16        |
|    fps              | 27        |
|    time_elapsed     | 45        |
|    total_timesteps  | 1251      |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 11.1      |
|    n_updates        | 1050      |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 76.5      |
|    ep_rew_mean      | -1.64e+03 |
|    exploration_rate | 0.855     |
| time/               |           |
|    episodes         | 20        |
|    fps              | 27        |
|    time_elapsed     | 54        |
|    total_timesteps  | 1529      |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 11.7      |
|    n_updates        | 1328      |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 82.7      |
|    ep_rew_mean      | -1.88e+03 |
|    exploration_rate | 0.811     |
| time/               |           |
|    episodes         | 24        |
|    fps              | 27        |
|    time_elapsed     | 71        |
|    total_timesteps  | 1985      |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 11.8      |
|    n_updates        | 1784      |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 86.8      |
|    ep_rew_mean      | -1.89e+03 |
|    exploration_rate | 0.769     |
| time/               |           |
|    episodes         | 28        |
|    fps              | 27        |
|    time_elapsed     | 86        |
|    total_timesteps  | 2429      |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 8.04      |
|    n_updates        | 2228      |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 86.2      |
|    ep_rew_mean      | -1.86e+03 |
|    exploration_rate | 0.738     |
| time/               |           |
|    episodes         | 32        |
|    fps              | 27        |
|    time_elapsed     | 98        |
|    total_timesteps  | 2760      |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 23.1      |
|    n_updates        | 2559      |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 82.4      |
|    ep_rew_mean      | -1.86e+03 |
|    exploration_rate | 0.718     |
| time/               |           |
|    episodes         | 36        |
|    fps              | 27        |
|    time_elapsed     | 105       |
|    total_timesteps  | 2966      |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 9.14      |
|    n_updates        | 2765      |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 83.6      |
|    ep_rew_mean      | -1.86e+03 |
|    exploration_rate | 0.682     |
| time/               |           |
|    episodes         | 40        |
|    fps              | 28        |
|    time_elapsed     | 119       |
|    total_timesteps  | 3344      |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 11.7      |
|    n_updates        | 3143      |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 86.8      |
|    ep_rew_mean      | -2.02e+03 |
|    exploration_rate | 0.637     |
| time/               |           |
|    episodes         | 44        |
|    fps              | 28        |
|    time_elapsed     | 136       |
|    total_timesteps  | 3819      |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 22.7      |
|    n_updates        | 3618      |
-----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 92.4     |
|    ep_rew_mean      | -2.3e+03 |
|    exploration_rate | 0.579    |
| time/               |          |
|    episodes         | 48       |
|    fps              | 28       |
|    time_elapsed     | 158      |
|    total_timesteps  | 4436     |
| train/              |          |
|    learning_rate    | 0.0005   |
|    loss             | 12.5     |
|    n_updates        | 4235     |
----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 93.4      |
|    ep_rew_mean      | -2.41e+03 |
|    exploration_rate | 0.538     |
| time/               |           |
|    episodes         | 52        |
|    fps              | 28        |
|    time_elapsed     | 173       |
|    total_timesteps  | 4858      |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 10.6      |
|    n_updates        | 4657      |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 90.7      |
|    ep_rew_mean      | -2.36e+03 |
|    exploration_rate | 0.517     |
| time/               |           |
|    episodes         | 56        |
|    fps              | 27        |
|    time_elapsed     | 181       |
|    total_timesteps  | 5080      |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 21.7      |
|    n_updates        | 4879      |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 96.1      |
|    ep_rew_mean      | -2.47e+03 |
|    exploration_rate | 0.452     |
| time/               |           |
|    episodes         | 60        |
|    fps              | 28        |
|    time_elapsed     | 205       |
|    total_timesteps  | 5768      |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 8.87      |
|    n_updates        | 5567      |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 101       |
|    ep_rew_mean      | -2.52e+03 |
|    exploration_rate | 0.387     |
| time/               |           |
|    episodes         | 64        |
|    fps              | 28        |
|    time_elapsed     | 229       |
|    total_timesteps  | 6457      |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 27.3      |
|    n_updates        | 6256      |
-----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 101      |
|    ep_rew_mean      | -2.6e+03 |
|    exploration_rate | 0.35     |
| time/               |          |
|    episodes         | 68       |
|    fps              | 28       |
|    time_elapsed     | 243      |
|    total_timesteps  | 6838     |
| train/              |          |
|    learning_rate    | 0.0005   |
|    loss             | 10.7     |
|    n_updates        | 6637     |
----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 108       |
|    ep_rew_mean      | -2.92e+03 |
|    exploration_rate | 0.262     |
| time/               |           |
|    episodes         | 72        |
|    fps              | 28        |
|    time_elapsed     | 277       |
|    total_timesteps  | 7773      |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 25.4      |
|    n_updates        | 7572      |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 108       |
|    ep_rew_mean      | -2.88e+03 |
|    exploration_rate | 0.219     |
| time/               |           |
|    episodes         | 76        |
|    fps              | 28        |
|    time_elapsed     | 293       |
|    total_timesteps  | 8224      |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 9.77      |
|    n_updates        | 8023      |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 129       |
|    ep_rew_mean      | -3.07e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 80        |
|    fps              | 28        |
|    time_elapsed     | 367       |
|    total_timesteps  | 10325     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 10.6      |
|    n_updates        | 10124     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 167       |
|    ep_rew_mean      | -3.95e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 84        |
|    fps              | 28        |
|    time_elapsed     | 498       |
|    total_timesteps  | 14043     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 10.4      |
|    n_updates        | 13842     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 178       |
|    ep_rew_mean      | -4.07e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 88        |
|    fps              | 28        |
|    time_elapsed     | 555       |
|    total_timesteps  | 15672     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 9.04      |
|    n_updates        | 15471     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 204       |
|    ep_rew_mean      | -4.57e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 92        |
|    fps              | 28        |
|    time_elapsed     | 664       |
|    total_timesteps  | 18793     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 11.4      |
|    n_updates        | 18592     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 206       |
|    ep_rew_mean      | -4.49e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 96        |
|    fps              | 28        |
|    time_elapsed     | 699       |
|    total_timesteps  | 19787     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 6.04      |
|    n_updates        | 19586     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 229       |
|    ep_rew_mean      | -5.67e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 100       |
|    fps              | 28        |
|    time_elapsed     | 807       |
|    total_timesteps  | 22881     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 7.54      |
|    n_updates        | 22680     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 250       |
|    ep_rew_mean      | -5.96e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 104       |
|    fps              | 28        |
|    time_elapsed     | 892       |
|    total_timesteps  | 25284     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 5.8       |
|    n_updates        | 25083     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 259       |
|    ep_rew_mean      | -6.14e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 108       |
|    fps              | 28        |
|    time_elapsed     | 937       |
|    total_timesteps  | 26564     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 6.14      |
|    n_updates        | 26363     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 267       |
|    ep_rew_mean      | -6.27e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 112       |
|    fps              | 28        |
|    time_elapsed     | 976       |
|    total_timesteps  | 27670     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 8.47      |
|    n_updates        | 27469     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 273       |
|    ep_rew_mean      | -6.39e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 116       |
|    fps              | 28        |
|    time_elapsed     | 1006      |
|    total_timesteps  | 28544     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 12.1      |
|    n_updates        | 28343     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 280       |
|    ep_rew_mean      | -6.63e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 120       |
|    fps              | 28        |
|    time_elapsed     | 1040      |
|    total_timesteps  | 29524     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 6.69      |
|    n_updates        | 29323     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 296       |
|    ep_rew_mean      | -6.65e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 124       |
|    fps              | 28        |
|    time_elapsed     | 1112      |
|    total_timesteps  | 31595     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 23.6      |
|    n_updates        | 31394     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 348       |
|    ep_rew_mean      | -5.77e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 128       |
|    fps              | 28        |
|    time_elapsed     | 1305      |
|    total_timesteps  | 37217     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 9.01      |
|    n_updates        | 37016     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 355       |
|    ep_rew_mean      | -5.94e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 132       |
|    fps              | 28        |
|    time_elapsed     | 1343      |
|    total_timesteps  | 38274     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 17.1      |
|    n_updates        | 38073     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 363       |
|    ep_rew_mean      | -6.06e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 136       |
|    fps              | 28        |
|    time_elapsed     | 1379      |
|    total_timesteps  | 39300     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 14.2      |
|    n_updates        | 39099     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 370       |
|    ep_rew_mean      | -6.13e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 140       |
|    fps              | 28        |
|    time_elapsed     | 1415      |
|    total_timesteps  | 40306     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 12.2      |
|    n_updates        | 40105     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 385       |
|    ep_rew_mean      | -6.33e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 144       |
|    fps              | 28        |
|    time_elapsed     | 1486      |
|    total_timesteps  | 42321     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 10.3      |
|    n_updates        | 42120     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 386       |
|    ep_rew_mean      | -6.21e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 148       |
|    fps              | 28        |
|    time_elapsed     | 1510      |
|    total_timesteps  | 43009     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 12.7      |
|    n_updates        | 42808     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 398       |
|    ep_rew_mean      | -5.97e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 152       |
|    fps              | 28        |
|    time_elapsed     | 1570      |
|    total_timesteps  | 44707     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 14.2      |
|    n_updates        | 44506     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 410       |
|    ep_rew_mean      | -6.17e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 156       |
|    fps              | 28        |
|    time_elapsed     | 1621      |
|    total_timesteps  | 46125     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 14.3      |
|    n_updates        | 45924     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 448       |
|    ep_rew_mean      | -6.27e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 160       |
|    fps              | 28        |
|    time_elapsed     | 1778      |
|    total_timesteps  | 50598     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 9.8       |
|    n_updates        | 50397     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 466       |
|    ep_rew_mean      | -6.52e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 164       |
|    fps              | 28        |
|    time_elapsed     | 1865      |
|    total_timesteps  | 53036     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 15.1      |
|    n_updates        | 52835     |
-----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 486      |
|    ep_rew_mean      | -6.7e+03 |
|    exploration_rate | 0.05     |
| time/               |          |
|    episodes         | 168      |
|    fps              | 28       |
|    time_elapsed     | 1948     |
|    total_timesteps  | 55422    |
| train/              |          |
|    learning_rate    | 0.0005   |
|    loss             | 13.4     |
|    n_updates        | 55221    |
----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 488       |
|    ep_rew_mean      | -6.62e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 172       |
|    fps              | 28        |
|    time_elapsed     | 1990      |
|    total_timesteps  | 56619     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 8.21      |
|    n_updates        | 56418     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 497       |
|    ep_rew_mean      | -6.59e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 176       |
|    fps              | 28        |
|    time_elapsed     | 2036      |
|    total_timesteps  | 57921     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 10.7      |
|    n_updates        | 57720     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 501       |
|    ep_rew_mean      | -6.41e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 180       |
|    fps              | 28        |
|    time_elapsed     | 2122      |
|    total_timesteps  | 60379     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 11        |
|    n_updates        | 60178     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 473       |
|    ep_rew_mean      | -5.49e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 184       |
|    fps              | 28        |
|    time_elapsed     | 2158      |
|    total_timesteps  | 61379     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 9.97      |
|    n_updates        | 61178     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 471       |
|    ep_rew_mean      | -5.43e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 188       |
|    fps              | 28        |
|    time_elapsed     | 2206      |
|    total_timesteps  | 62764     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 10.9      |
|    n_updates        | 62563     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 447       |
|    ep_rew_mean      | -4.99e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 192       |
|    fps              | 28        |
|    time_elapsed     | 2233      |
|    total_timesteps  | 63542     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 8.43      |
|    n_updates        | 63341     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 456       |
|    ep_rew_mean      | -5.01e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 196       |
|    fps              | 28        |
|    time_elapsed     | 2300      |
|    total_timesteps  | 65396     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 9.49      |
|    n_updates        | 65195     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 436       |
|    ep_rew_mean      | -3.78e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 200       |
|    fps              | 28        |
|    time_elapsed     | 2338      |
|    total_timesteps  | 66478     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 8.22      |
|    n_updates        | 66277     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 423       |
|    ep_rew_mean      | -3.69e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 204       |
|    fps              | 28        |
|    time_elapsed     | 2376      |
|    total_timesteps  | 67544     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 10.6      |
|    n_updates        | 67343     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 452       |
|    ep_rew_mean      | -3.74e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 208       |
|    fps              | 28        |
|    time_elapsed     | 2526      |
|    total_timesteps  | 71804     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 7.62      |
|    n_updates        | 71603     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 447       |
|    ep_rew_mean      | -3.71e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 212       |
|    fps              | 28        |
|    time_elapsed     | 2545      |
|    total_timesteps  | 72355     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 9.89      |
|    n_updates        | 72154     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 452       |
|    ep_rew_mean      | -3.67e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 216       |
|    fps              | 28        |
|    time_elapsed     | 2593      |
|    total_timesteps  | 73696     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 5.2       |
|    n_updates        | 73495     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 482       |
|    ep_rew_mean      | -3.96e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 220       |
|    fps              | 28        |
|    time_elapsed     | 2735      |
|    total_timesteps  | 77758     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 7.05      |
|    n_updates        | 77557     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 506       |
|    ep_rew_mean      | -4.33e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 224       |
|    fps              | 28        |
|    time_elapsed     | 2893      |
|    total_timesteps  | 82218     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 10.5      |
|    n_updates        | 82017     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 468       |
|    ep_rew_mean      | -5.44e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 228       |
|    fps              | 28        |
|    time_elapsed     | 2957      |
|    total_timesteps  | 84029     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 14.4      |
|    n_updates        | 83828     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 485       |
|    ep_rew_mean      | -5.66e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 232       |
|    fps              | 28        |
|    time_elapsed     | 3053      |
|    total_timesteps  | 86796     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 7.26      |
|    n_updates        | 86595     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 509       |
|    ep_rew_mean      | -5.43e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 236       |
|    fps              | 28        |
|    time_elapsed     | 3174      |
|    total_timesteps  | 90200     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 24        |
|    n_updates        | 89999     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 526       |
|    ep_rew_mean      | -5.46e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 240       |
|    fps              | 28        |
|    time_elapsed     | 3270      |
|    total_timesteps  | 92922     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 12        |
|    n_updates        | 92721     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 516       |
|    ep_rew_mean      | -5.32e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 244       |
|    fps              | 28        |
|    time_elapsed     | 3306      |
|    total_timesteps  | 93950     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 8.18      |
|    n_updates        | 93749     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 526       |
|    ep_rew_mean      | -5.39e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 248       |
|    fps              | 28        |
|    time_elapsed     | 3367      |
|    total_timesteps  | 95654     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 8.28      |
|    n_updates        | 95453     |
-----------------------------------
-----------------------------------
| rollout/            |           |
|    ep_len_mean      | 540       |
|    ep_rew_mean      | -6.07e+03 |
|    exploration_rate | 0.05      |
| time/               |           |
|    episodes         | 252       |
|    fps              | 28        |
|    time_elapsed     | 3474      |
|    total_timesteps  | 98685     |
| train/              |           |
|    learning_rate    | 0.0005    |
|    loss             | 8.19      |
|    n_updates        | 98484     |
-----------------------------------
 100% ━━━━━━━━━━━━━━━━━━━━━━━━━ 100,000/100,000  [ 0:58:41 < 0:00:00 , 29 it/s ]

Done Learning!!

1
